% Project homepage of MVAPICH/MVAPICH2 (corporate author, hence the extra braces).
@misc{MVAPICH:homepage,
  author       = {{Network-Based Computing Laboratory}},
  title        = {{MVAPICH/MVAPICH2: MPI-1/MPI-2 for InfiniBand and iWARP with OpenFabrics}},
  howpublished = {http://mvapich.cse.ohio-state.edu/}
}

% Ammasso vendor homepage. Typed as misc because it is a web reference with
% only a title and a URL; standard styles do not print howpublished for
% inproceedings entries and would warn about missing author/booktitle/year.
@misc{AMMASSOU,
  title        = {{Ammasso Incorporation}},
  howpublished = {http://www.ammasso.com}
}

% Open MPI project homepage.
@misc{OpenMPI:homepage,
  author       = {{OpenMPI}},
  title        = {{Open Source High Performance Computing}},
  howpublished = {http://www.open-mpi.org/}
}

% STOMP (Subsurface Transport over Multiple Phases) homepage.
@misc{STOMP:homepage,
  author       = {{Subsurface Transport over Multiple Phases}},
  title        = {{STOMP}},
  howpublished = {http://stomp.pnl.gov/}
}
% Myricom vendor homepage.
@misc{myricom,
  title        = {{Myricom Corporation}},
  howpublished = {http://www.myri.com/}
}

% ATLAS supercomputer at Lawrence Livermore National Lab (site URL).
@misc{atlas:llnl,
  title        = {{ATLAS SuperComputer, Lawrence Livermore National Lab}},
  howpublished = {http://computing.llnl.gov/}
}

% Chinook supercomputer at EMSL, PNNL (site URL).
@misc{chinook:pnl,
  title        = {{Chinook SuperComputer, Environmental Molecular Science Lab, PNNL}},
  howpublished = {http://emsl.pnl.gov}
}

% Mellanox vendor homepage.
@misc{mellanox,
  title        = {{Mellanox Technologies}},
  howpublished = {http://www.mellanox.com/}
}

% Voltaire vendor homepage.
@misc{voltaire,
  title        = {{Voltaire Technologies}},
  howpublished = {http://www.voltaire.com/}
}

% Texas Advanced Computing Center homepage.
@misc{tacc,
  title        = {{Texas Advanced Computing Center}},
  howpublished = {http://www.tacc.utexas.edu/}
}

% DARPA High Productivity Computer Systems program homepage.
@misc{hpcs,
  title        = {{DARPA High Productivity Computer Systems}},
  howpublished = {http://www.highproductivity.org/}
}

% Quadrics vendor homepage.
@misc{quadrics,
  title        = {{Quadrics Corporation}},
  howpublished = {http://www.quadrics.com/}
}

% Chelsio vendor homepage.
@misc{chelsio,
  title        = {{Chelsio Communications}},
  howpublished = {http://www.chelsio.com/}
}

% InfiniBand Architecture Specification, Release 1.2 (corporate author).
% The month uses the predefined macro so each style can format or
% abbreviate it itself.
@misc{IBA:SPEC,
  author = {{InfiniBand Trade Association}},
  title  = {{InfiniBand Architecture Specification, Release 1.2}},
  month  = oct,
  year   = {2004}
}

% Parallel Spectral Transform Shallow Water Model homepage.
@misc{PSTSWM,
  title        = {{Parallel Spectral Transform Shallow Water Model}},
  howpublished = {http://www.csm.ornl.gov/chammp/pstswm/}
}

% TOP500 list homepage.
@misc{TOP500,
  title        = {{TOP500 Supercomputing Sites}},
  howpublished = {http://www.top500.org}
}

% Yan, Min and Awan, 2006: congestion control in InfiniBand networks.
% Page range uses a double hyphen so it typesets as an en-dash.
@article{yan:aina06,
  author    = {S. Yan and G. Min and I. Awan},
  title     = {{An Enhanced Congestion Control Mechanism in InfiniBand Networks for High Performance Computing Systems}},
  journal   = {Advanced Information Networking and Applications},
  volume    = {1},
  year      = {2006},
  pages     = {845--850},
  issn      = {1550-445X},
  publisher = {IEEE Computer Society},
}

% Gusat et al., Hot Interconnects 2005.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{gusat:hoti05,
  author    = {M. Gusat and D. Craddock and W. Denzel and T. Engbersen and
               N. Ni and G. Pfister and W. Rooney and Jos{\'e} Duato},
  title     = {{Congestion Control in InfiniBand Networks}},
  booktitle = {Hot Interconnects},
  year      = {2005},
  pages     = {158--159},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Santos, Turner and Janakiraman, INFOCOM 2003.
% Venue spelled as the IEEE INFOCOM conference (the ee URL points at
% ieee-infocom.org), not "InfoComm".
@inproceedings{santos:infocom03,
  author    = {J. R. Santos and Y. Turner and G. J. Janakiraman},
  title     = {{End-to-End Congestion Control for InfiniBand}},
  booktitle = {{IEEE} {INFOCOM}},
  year      = {2003},
  pages     = {1123--1133},
  ee        = {http://www.ieee-infocom.org/2003/papers/28_01.PDF},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Shakkottai and Srikant, Winter Simulation Conference 2001.
% Ordinal in the proceedings title corrected from "33nd" to "33rd".
@inproceedings{sanjay:wsc01,
  author    = {Sanjay Shakkottai and R. Srikant},
  title     = {Deterministic fluid models of congestion control in high-speed networks},
  booktitle = {WSC '01: Proceedings of the 33rd conference on Winter simulation},
  year      = {2001},
  isbn      = {0-7803-7309-X},
  pages     = {1275--1281},
  location  = {Arlington, Virginia},
  publisher = {IEEE Computer Society}
}


 
% Jacobson, ACM SIGCOMM 1988.
% The URL carries an explicit scheme so url-aware styles produce a working
% link; the stray trailing space in booktitle is dropped.
@inproceedings{jacobson:sigcomm88,
  author    = {V. Jacobson},
  title     = {{Congestion Avoidance and Control}},
  booktitle = {{ACM} {SIGCOMM}},
  year      = {1988},
  url       = {http://citeseer.ist.psu.edu/jacobson88congestion.html}
}


% Pfister and Norton on hot-spot contention, as collected in a 1994
% IEEE Computer Society Press book (hence incollection with booktitle,
% publisher and isbn rather than article/journal).
% The author list is singly braced so BibTeX parses two separate names.
@incollection{201214,
  author    = {Gregory F. Pfister and V. Alan Norton},
  title     = {{Hot spot Contention and Combining in Multistage Interconnection Networks}},
  booktitle = {Interconnection networks for high-performance parallel computers},
  year      = {1994},
  isbn      = {0-8186-6197-6},
  pages     = {276--281},
  publisher = {IEEE Computer Society Press},
}

% Puente and Gregorio, IEEE TPDS 18(6), 2007.
% Page range uses a double hyphen so it typesets as an en-dash.
@article{puente:tpds0607,
  author    = {Valentin Puente and Jose Angel Gregorio},
  title     = {Immucube: Scalable Fault-Tolerant Routing for k-ary n-cube Networks},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {18},
  number    = {6},
  year      = {2007},
  issn      = {1045-9219},
  pages     = {776--788},
  publisher = {IEEE Computer Society},
}

% Kim et al., IEEE TPDS 18(4), 2007.
% Page range uses a double hyphen so it typesets as an en-dash.
@article{kim:tpds0407,
  author  = {E. Kim and K. H. Yum and C. R. Das and M. S. Yousif and J. Duato},
  title   = {{Exploring IBA Design Space for Improved Performance}},
  journal = {IEEE Transactions on Parallel and Distributed Systems},
  volume  = {18},
  number  = {4},
  year    = {2007},
  pages   = {498--510}
}

% Bermudez et al., IEEE TPDS 18(2), 2007.
% Journal name matches the spelling used by the other TPDS entries; the
% title carries no hard-coded final period and protects the InfiniBand
% capitalisation against sentence-casing styles.
@article{bermudez:tpds0207,
  author  = {Aurelio Berm{\'u}dez and Rafael Casado and
             Francisco J. Quiles and Jos{\'e} Duato},
  title   = {Handling Topology Changes in {InfiniBand}},
  journal = {IEEE Transactions on Parallel and Distributed Systems},
  volume  = {18},
  number  = {2},
  year    = {2007},
  pages   = {172--185},
  ee      = {http://doi.ieeecomputersociety.org/10.1109/TPDS.2007.26}
}

% Gomez et al., IEEE Transactions on Computers 55(4), 2006.
% Page range uses a double hyphen so it typesets as an en-dash.
@article{gomez:tpds0406,
  author    = {Maria Engracia Gomez and Nils Agne Nordbotten and
               Jose Flich and Pedro Lopez and Antonio Robles and
               Jose Duato and Tor Skeie and Olav Lysne},
  title     = {A Routing Methodology for Achieving Fault Tolerance in Direct Networks},
  journal   = {IEEE Transactions on Computers},
  volume    = {55},
  number    = {4},
  year      = {2006},
  issn      = {0018-9340},
  pages     = {400--415},
  publisher = {IEEE Computer Society},
}


% Yu, Chung and Moreira, SC 2006.
% The Blue Gene product names are braced so sentence-casing styles keep
% their capitalisation.
@inproceedings{yu:sc06,
  author    = {Hao Yu and I-Hsin Chung and Jose Moreira},
  title     = {{Blue Gene} system software---Topology mapping for {Blue Gene/L} supercomputer},
  booktitle = {SC '06: Proceedings of the 2006 ACM/IEEE conference on Supercomputing},
  year      = {2006},
  isbn      = {0-7695-2700-0},
  pages     = {116},
  location  = {Tampa, Florida},
  publisher = {ACM Press},
}

% Nachiondo, Flich and Duato, ICPADS 2006.
@inproceedings{nachiondo:icpads06,
  author    = {T. Nachiondo and J. Flich and J. Duato},
  title     = {{Destination-Based HoL Blocking Elimination}},
  booktitle = {ICPADS '06: Proceedings of the 12th International Conference on Parallel and Distributed Systems},
  year      = {2006},
  pages     = {213--222},
  isbn      = {0-7695-2612-8},
  publisher = {IEEE Computer Society},
}

% Brightwell et al., IEEE Micro 26(3), 2006.
% SeaStar is braced so sentence-casing styles keep its internal capital.
@article{brightwell:micro06,
  author    = {Ron Brightwell and Kevin T. Pedretti and
               Keith D. Underwood and Trammell Hudson},
  title     = {{SeaStar} Interconnect: Balanced Bandwidth for Scalable Performance},
  journal   = {IEEE Micro},
  volume    = {26},
  number    = {3},
  year      = {2006},
  issn      = {0272-1732},
  pages     = {41--57},
  publisher = {IEEE Computer Society Press},
}


% Duato, Yalamanchili and Ni, textbook on interconnection networks (1997).
@book{duato:book,
  author    = {J. Duato and S. Yalamanchili and L. Ni},
  title     = {{Interconnection Networks: An Engineering Approach}},
  publisher = {The IEEE Computer Society Press},
  year      = {1997}
}

% Sancho et al., ICPP 2003.
% IEEE Computer Society Press is a publisher, so it lives in publisher
% rather than series; initials are spaced so they parse as separate tokens;
% InfiniBand is braced against sentence-casing styles.
@InProceedings{icpp03,
  author    = {J. C. Sancho and A. Robles and P. Lopez and J. Flich and J. Duato},
  title     = {Routing in {InfiniBand} Torus Network Topologies},
  booktitle = {2003 International Conference on Parallel Processing (ICPP'2003)},
  year      = {2003},
  publisher = {IEEE Computer Society Press}
}

% Martinez et al., IPDPS 2003.
@InProceedings{duato:ipdps03,
  author    = {J. C. Martinez and J. Flich and A. Robles and P. Lopez and J. Duato},
  title     = {{Supporting Fully Adaptive Routing in InfiniBand Networks}},
  booktitle = {Proceedings of the 17th International Symposium on Parallel and Distributed Processing},
  year      = {2003},
}

% Sancho et al., ICPP 2002.
@inproceedings{sancho:icpp02,
  author    = {J. C. Sancho and A. Robles and J. Flich and P. Lopez and J. Duato},
  title     = {{Effective Methodology for Deadlock-Free Minimal Routing in InfiniBand Networks}},
  booktitle = {ICPP '02: Proceedings of the 2002 International Conference on Parallel Processing (ICPP'02)},
  year      = {2002},
  pages     = {409},
  isbn      = {0-7695-1677-7},
}

% Kumar, Grama, Gupta and Karypis, parallel computing textbook (1994).
@book{vipin:book,
  author    = {V. Kumar and A. Grama and A. Gupta and G. Karypis},
  title     = {{Introduction to Parallel Computing: Design and Analysis of Algorithms}},
  publisher = {Benjamin-Cummings Publishing Co.},
  address   = {Redwood City, CA, USA},
  year      = {1994},
  isbn      = {0-8053-3170-0},
}

% Sancho and Robles, Euro-Par 2000.
@inproceedings{sancho:europar00,
  author    = {J. C. Sancho and A. Robles},
  title     = {{Improving the Up*/Down* Routing Scheme for Networks of Workstations}},
  booktitle = {Euro-Par '00: Proceedings from the 6th International Euro-Par Conference on Parallel Processing},
  year      = {2000},
  pages     = {882--889},
  isbn      = {3-540-67956-1}
}

% Lopez, Flich and Duato, ICPP 2001.
% The short conference tag now agrees with the 2001 proceedings it prefixes.
@inproceedings{lopez:icpp01,
  author    = {P. Lopez and J. Flich and J. Duato},
  title     = {{Deadlock-Free Routing in InfiniBand through Destination Renaming}},
  booktitle = {ICPP '01: Proceedings of the 2001 International Conference on Parallel Processing},
  year      = {2001},
  isbn      = {0-7695-1257-7},
  pages     = {427--436}
}

% Sancho, Robles and Duato, ICPP 2001.
% The short conference tag now agrees with the 2001 proceedings it prefixes.
@inproceedings{sancho:icpp01,
  author    = {J. C. Sancho and A. Robles and J. Duato},
  title     = {{Effective Strategy to Compute Forwarding Tables for InfiniBand Networks}},
  booktitle = {ICPP '01: Proceedings of the 2001 International Conference on Parallel Processing},
  year      = {2001},
  isbn      = {0-7695-1257-7},
  pages     = {48--60}
}

% Sancho, Robles and Duato, CANPC 2000.
% Title verb corrected from "Computer" to "Compute".
@inproceedings{sancho:caanpc00,
  author    = {J. C. Sancho and A. Robles and J. Duato},
  title     = {{A New Methodology to Compute Deadlock-Free Routing Tables for Irregular Networks}},
  booktitle = {Communication, Architecture, and Applications for Network-Based Parallel Computing},
  pages     = {45--60},
  year      = {2000}
}


% Flich et al., IPDPS 2000.
% Page range uses a double hyphen; Myrinet is braced against
% sentence-casing styles.
@inproceedings{flich:ipdps00,
  author    = {Jose Flich and Manuel P. Malumbres and
               Pedro L{\'o}pez and Jos{\'e} Duato},
  title     = {Improving Routing Performance in {Myrinet} Networks},
  booktitle = {IPDPS},
  year      = {2000},
  pages     = {27--32}
}

% Leiserson, fat-trees paper, IEEE Transactions on Computers 34(10), 1985.
% Page range uses a double hyphen so it typesets as an en-dash.
@article{fattreeclassic,
  author    = {C. E. Leiserson},
  title     = {{Fat-Trees: Universal Networks for Hardware-Efficient Supercomputing}},
  journal   = {IEEE Transactions on Computers},
  volume    = {34},
  number    = {10},
  year      = {1985},
  pages     = {892--901},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
% Narravula et al., ICPP 2007.
@inproceedings{narravul:icpp07,
  author    = {S. Narravula and A. Mamidala and A. Vishnu and
               G. Santhanaraman and D. K. Panda},
  title     = {{High Performance MPI over iWARP: Early Experiences}},
  booktitle = {International Conference on Parallel Processing},
  year      = {2007},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu and Krishnan, CCGrid 2010.
@inproceedings{vishnu:ccgrid10,
  author    = {A. Vishnu and M. Krishnan},
  title     = {{Efficient On-demand Connection Management Protocols with PGAS Models over InfiniBand}},
  booktitle = {International Conference on Cluster, Cloud and Grid Computing},
  year      = {2010},
}

% Vishnu and Krishnan, submitted to ICPP 2010.
% Publication status is kept in note so booktitle holds only the venue
% name (styles prepend "In" to booktitle themselves).
@inproceedings{vishnu:icpp10,
  author    = {A. Vishnu and M. Krishnan},
  title     = {{ACTS: Advanced Connection Teardown Schemes with PGAS Models for InfiniBand Clusters}},
  booktitle = {International Conference on Parallel Processing},
  year      = {2010},
  note      = {In submission},
}

% Vishnu et al., CCGrid 2007.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{vishnu:ccgrid07,
  author    = {A. Vishnu and M. J. Koop and A. Moody and
               A. R. Mamidala and S. Narravula and D. K. Panda},
  title     = {{Hot-Spot Avoidance With Multi-Pathing Over InfiniBand: An MPI Perspective}},
  booktitle = {Cluster Computing and Grid},
  year      = {2007},
  pages     = {479--486},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu, Krishnan and Panda, Cluster 2009.
% Authors are separated by "and" throughout (a comma would be parsed as
% a Last, First split); "wwith" typo fixed in the title.
% NOTE(review): the page range equals that of vishnu:ccgrid07 - confirm.
@inproceedings{vishnu:cluster09,
  author    = {A. Vishnu and M. K. Krishnan and D. K. Panda},
  title     = {{A Hardware-Software Approach to Network Fault Tolerance with InfiniBand Cluster}},
  booktitle = {International Conference on Cluster Computing},
  year      = {2009},
  pages     = {479--486},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Dinan et al., SC 2009.
@inproceedings{dinan:sc09,
  author    = {Dinan, James and Larkins, D. Brian and Sadayappan, P. and
               Krishnamoorthy, Sriram and Nieplocha, Jarek},
  title     = {Scalable work stealing},
  booktitle = {SC '09: Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
  year      = {2009},
  pages     = {1--11},
  isbn      = {978-1-60558-744-8},
  location  = {Portland, Oregon},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

% Balaji et al., EuroPVM/MPI 2009.
% The umlaut is written as a BibTeX special character (brace group that
% starts with the accent command) so sorting and labels treat it as one
% letter; MPI is braced against sentence-casing styles.
@inproceedings{balaji:europvm09,
  author    = {Balaji, Pavan and Buntinas, Darius and Goodell, David and
               Gropp, William and Kumar, Sameer and Lusk, Ewing and
               Thakur, Rajeev and Tr{\"a}ff, Jesper Larsson},
  title     = {{MPI} on a Million Processors},
  booktitle = {Proceedings of the 16th European PVM/MPI Users' Group Meeting on Recent Advances in Parallel Virtual Machine and Message Passing Interface},
  year      = {2009},
  pages     = {20--30},
  location  = {Espoo, Finland},
  publisher = {Springer-Verlag},
  address   = {Berlin, Heidelberg},
}

% Vishnu, Benton and Panda, HIPS workshop at IPDPS 2007.
@inproceedings{vishnu:12x,
  author    = {A. Vishnu and B. Benton and D. K. Panda},
  title     = {{High Performance MPI on IBM 12x InfiniBand  Architecture}},
  booktitle = {International Workshop on High-Level Parallel Programming Models and Supportive Environments, held in conjunction with IPDPS '07 (HIPS'07)},
  year      = {2007},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu et al., SMTPS workshop at IPDPS 2007.
% The month uses the predefined macro so each style can format or
% abbreviate it itself.
@inproceedings{vishnu:smtps07,
  author    = {A. Vishnu and A. Mamidala and S. Narravula and D. K. Panda},
  title     = {{Automatic Path Migration over InfiniBand: Early Experiences}},
  booktitle = {Proceedings of Third International Workshop on System Management Techniques, Processes, and Services, held in conjunction with IPDPS'07},
  month     = mar,
  year      = 2007
}

% Narravula et al., CCGrid 2007.
% Second author's surname corrected from "Marnidala" to "Mamidala" (the
% spelling used by every other entry in this file); no hard-coded final
% period in the title; double-hyphen page range.
@inproceedings{narravul:ccgrid07-1,
  author    = {Sundeep Narravula and A. Mamidala and Abhinav Vishnu and
               Karthikeyan Vaidyanathan and Dhabaleswar K. Panda},
  title     = {High Performance Distributed Lock Management Services using Network-based Remote Atomic Operations},
  booktitle = {CCGRID},
  year      = {2007},
  pages     = {583--590},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Mamidala et al., PPoPP 2007.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{mamidala:ppopp07,
  author    = {Amith R. Mamidala and Sundeep Narravula and Abhinav Vishnu and
               Gopalakrishnan Santhanaraman and Dhabaleswar K. Panda},
  title     = {{On using Connection-Oriented vs. Connection-Less Transport for Performance and Scalability of Collective and One-sided Operations: Trade-offs and Impact}},
  booktitle = {PPOPP},
  year      = {2007},
  pages     = {46--54},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Mamidala, Vishnu and Panda, EuroPVM/MPI 2006.
% The underscore in MPI_Allgather is escaped: a bare underscore in text
% mode is a LaTeX error. Acronyms are braced against sentence-casing
% styles; no hard-coded final period; double-hyphen page range.
@inproceedings{mamidala:europvm06,
  author    = {Amith R. Mamidala and Abhinav Vishnu and Dhabaleswar K. Panda},
  title     = {Efficient Shared Memory and {RDMA} Based Design for {MPI\_Allgather} over {InfiniBand}},
  booktitle = {PVM/MPI},
  year      = {2006},
  pages     = {66--75},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu et al., SuperComputing 2006.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{vishnu:sc06-1,
  author    = {Abhinav Vishnu and Prachi Gupta and
               Amith R. Mamidala and Dhabaleswar K. Panda},
  title     = {{A Software Based Approach for Providing Network Fault Tolerance in Clusters with uDAPL Interface: MPI Level Design and Performance Evaluation}},
  booktitle = {SuperComputing},
  year      = {2006},
  pages     = {85--96},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu et al., HiPC 2005.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{vishnu:hipc05,
  author    = {A. Vishnu and G. Santhanaraman and W. Huang and
               H.-W. Jin and D. K. Panda},
  title     = {{Supporting MPI-2 One Sided Communication on Multi-rail InfiniBand Clusters: Design Challenges and Performance Benefits}},
  booktitle = {International Conference on High Performance Computing},
  year      = {2005},
  pages     = {137--147},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sur et al., Hot Interconnects 2005.
% The title ends at its question mark (no extra hard-coded period);
% InfiniBand is braced against sentence-casing styles; double-hyphen
% page range.
@inproceedings{sur:hoti05,
  author    = {Sayantan Sur and Abhinav Vishnu and Hyun-Wook Jin and
               Wei Huang and Dhabaleswar K. Panda},
  title     = {Can Memory-Less Network Adapters Benefit Next-Generation {InfiniBand} Systems?},
  booktitle = {Hot Interconnects},
  year      = {2005},
  pages     = {45--50},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Vishnu et al., SMTPS workshop, 2005.
% The co-located conference tag now agrees with the 2005 year field
% (it read IPDPS'07); no hard-coded final period in the title.
@inproceedings{vishnu:smtps05,
  author    = {A. Vishnu and A. R. Mamidala and H.-W. Jin and D. K. Panda},
  title     = {{Performance Modeling of Subnet Management on Fat Tree InfiniBand Networks using OpenSM}},
  booktitle = {Proceedings of First International Workshop on System Management Techniques, Processes, and Services, held in conjunction with IPDPS'05},
  year      = {2005},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Liu et al., IEEE Micro 25(1), 2005.
% No hard-coded final period in the title; product names braced against
% sentence-casing styles; double-hyphen page range.
@article{liu:micro05,
  author    = {Jiuxing Liu and Amith R. Mamidala and
               Abhinav Vishnu and Dhabaleswar K. Panda},
  title     = {Evaluating {InfiniBand} Performance with {PCI Express}},
  journal   = {IEEE Micro},
  volume    = {25},
  number    = {1},
  year      = {2005},
  pages     = {20--29},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Liu, Vishnu and Panda, SuperComputing 2004.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{liu:sc04,
  author    = {J. Liu and A. Vishnu and D. K. Panda},
  title     = {{Building Multirail InfiniBand Clusters: MPI-Level Design and Performance Evaluation}},
  booktitle = {SuperComputing},
  year      = {2004},
  pages     = {33--44},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
% Chai, Gao and Panda, CCGrid 2007.
% No hard-coded final period in the title; Intel braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{chai:ccgrid07,
  author    = {Lei Chai and Qi Gao and Dhabaleswar K. Panda},
  title     = {Understanding the Impact of Multi-Core Architecture in Cluster Computing: A Case Study with {Intel} Dual-Core System},
  booktitle = {CCGRID},
  year      = {2007},
  pages     = {471--478},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


% Koop, Jones and Panda, CCGrid 2007.
% No hard-coded final period in the title; acronyms braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{koop:ccgrid07,
  author    = {Matthew J. Koop and Terry Jones and Dhabaleswar K. Panda},
  title     = {Reducing Connection Memory Requirements of {MPI} for {InfiniBand} Clusters: A Message Coalescing Approach},
  booktitle = {CCGRID},
  year      = {2007},
  pages     = {495--504},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


% Chai, Noronha and Panda, CCGrid 2006.
% The title ends at its question mark (no extra hard-coded period);
% double-hyphen page range.
@inproceedings{chai:ccgrid06,
  author    = {L. Chai and R. Noronha and D. K. Panda},
  title     = {{MPI over uDAPL: Can High Performance and Portability Exist Across Architectures?}},
  booktitle = {Cluster Computing and Grid},
  year      = {2006},
  pages     = {19--26},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Huang et al., CCGrid 2006.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{huang:ccgrid06,
  author    = {W. Huang and G. Santhanaraman and H.-W. Jin and
               Q. Gao and D. K. Panda},
  title     = {{Design of High Performance MVAPICH2: MPI2 over InfiniBand}},
  booktitle = {Cluster Computing and Grid},
  year      = {2006},
  pages     = {43--48},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Gao et al., ICPP 2006.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{gao:icpp06,
  author    = {Qi Gao and Weikuan Yu and Wei Huang and Dhabaleswar K. Panda},
  title     = {{Application-Transparent Checkpoint/Restart for MPI Programs over InfiniBand}},
  booktitle = {International Conference on Parallel Processing},
  year      = {2006},
  pages     = {471--478}
}


% Yu, Gao and Panda, IPDPS 2006.
@inproceedings{yu:ipdps06,
  author    = {Weikuan Yu and Qi Gao and Dhabaleswar K. Panda},
  title     = {{Adaptive Connection Management for Scalable MPI over InfiniBand}},
  booktitle = {IPDPS},
  year      = {2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Mamidala et al., IPDPS 2006.
% No hard-coded final period in the title; acronyms and InfiniBand are
% braced against sentence-casing styles.
@inproceedings{mamidala:ipdps06,
  author    = {Amith R. Mamidala and Lei Chai and
               Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Efficient {SMP}-aware {MPI}-level broadcast over {InfiniBand's} hardware multicast},
  booktitle = {IPDPS},
  year      = {2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sur et al., IPDPS 2006.
% No hard-coded final period in the title; MPI and InfiniBand are braced
% against sentence-casing styles.
@inproceedings{sur:ipdps06-1,
  author    = {Sayantan Sur and Lei Chai and
               Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Shared receive queue based scalable {MPI} design for {InfiniBand} clusters},
  booktitle = {IPDPS},
  year      = {2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sur et al., PPoPP 2006.
% No hard-coded final period in the title; acronyms braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{sur:ppopp06,
  author    = {Sayantan Sur and Hyun-Wook Jin and
               Lei Chai and Dhabaleswar K. Panda},
  title     = {{RDMA} read based rendezvous protocol for {MPI} over {InfiniBand}: design alternatives and benefits},
  booktitle = {PPOPP},
  year      = {2006},
  pages     = {32--39},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sur, Koop and Panda, SC 2006.
% No hard-coded final period in the title; MPI and InfiniBand are braced
% against sentence-casing styles.
@inproceedings{sur:sc06,
  author    = {Sayantan Sur and Matthew J. Koop and Dhabaleswar K. Panda},
  title     = {{MPI} and communication - High-performance and scalable {MPI} over {InfiniBand} with reduced memory usage: an in-depth performance analysis},
  booktitle = {SC},
  year      = {2006},
  pages     = {105},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Yelick, EuroPVM/MPI 2006.
% No hard-coded final period in the title (the style supplies punctuation).
@inproceedings{yelick:europvm06,
  author    = {Katherine A. Yelick},
  title     = {Performance Advantages of Partitioned Global Address Space Languages},
  booktitle = {PVM/MPI},
  year      = {2006},
  pages     = {6},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Bell et al., IPDPS 2006.
% No hard-coded final period in the title (the style supplies punctuation).
@inproceedings{bell:ipdps06,
  author    = {Christian Bell and Dan Bonachea and
               Rajesh Nishtala and Katherine A. Yelick},
  title     = {Optimizing bandwidth limited problems using one-sided communication and overlap},
  booktitle = {IPDPS},
  year      = {2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Buntinas, Mercier and Gropp, CCGrid 2006.
% No hard-coded final period in the title; Nemesis braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{buntinas:ccgrid06,
  author    = {Darius Buntinas and Guillaume Mercier and William Gropp},
  title     = {Design and Evaluation of {Nemesis}, a Scalable, Low-Latency, Message-Passing Communication Subsystem},
  booktitle = {CCGRID},
  year      = {2006},
  pages     = {521--530},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sur et al., HiPC 2005.
% No hard-coded final period in the title; acronyms braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{sur:hipc05,
  author    = {Sayantan Sur and U. K. R. Bondhugula and Amith R. Mamidala and
               Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {High Performance {RDMA} Based All-to-All Broadcast for {InfiniBand} Clusters},
  booktitle = {HiPC},
  year      = {2005},
  pages     = {148--157},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Sivaram et al., Hot Interconnects 2005.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{sivaram:hoti05,
  author    = {Rajeev Sivaram and Rama K. Govindaraju and Peter H. Hochschild and
               Robert Blackmore and Piyush Chaudhary},
  title     = {{Breaking the Connection: RDMA Deconstructed}},
  booktitle = {Hot Interconnects},
  year      = {2005},
  pages     = {36--42}
}

% The key sur:hoti05 (Sur et al., Hot Interconnects 2005) is defined once
% earlier in this file. A second, field-for-field identical definition stood
% here; it was removed because BibTeX reports a repeated key as an error.

% Jin et al., ICPP 2005.
% No hard-coded final period in the title; proper nouns and acronyms
% braced against sentence-casing styles; double-hyphen page range.
@inproceedings{jin:icpp05,
  author    = {Hyun-Wook Jin and Sayantan Sur and
               Lei Chai and Dhabaleswar K. Panda},
  title     = {{LiMIC}: Support for High-Performance {MPI} Intra-node Communication on {Linux} Cluster},
  booktitle = {ICPP},
  year      = {2005},
  pages     = {184--191},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Huang et al., IPDPS 2005.
@inproceedings{huang:ipdps05,
  author    = {W. Huang and G. Santhanaraman and H.-W. Jin and D. K. Panda},
  title     = {{Scheduling of MPI-2 One Sided Operations over InfiniBand}},
  booktitle = {International Symposium on Parallel and Distributed Processing},
  year      = {2005},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Huang et al., EuroPVM/MPI 2005.
% No hard-coded final period in the title; MPI-2 and InfiniBand braced
% against sentence-casing styles; double-hyphen page range.
@inproceedings{huang:europvm05,
  author    = {Wei Huang and Gopalakrishnan Santhanaraman and
               Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Design Alternatives and Performance Trade-Offs for Implementing {MPI-2} over {InfiniBand}},
  booktitle = {PVM/MPI},
  year      = {2005},
  pages     = {191--199},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Chai et al., EuroPVM/MPI 2005.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{chai:europvm05,
  author    = {L. Chai and R. Noronha and P. Gupta and
               G. Brown and D. K. Panda},
  title     = {{Designing a Portable MPI-2 over Modern Interconnects Using uDAPL Interface}},
  booktitle = {EuroPVM/MPI},
  year      = {2005},
  pages     = {200--208},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


% Mamidala, Jin and Panda, EuroPVM/MPI 2005.
% No hard-coded final period in the title; MPI and InfiniBand braced
% against sentence-casing styles; double-hyphen page range.
@inproceedings{mamidala:europvm05,
  author    = {Amith R. Mamidala and Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Efficient Hardware Multicast Group Management for Multiple {MPI} Communicators over {InfiniBand}},
  booktitle = {PVM/MPI},
  year      = {2005},
  pages     = {388--398},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Liss, Birk and Schuster, IEEE TPDS 16(9), 2005.
% Journal name is spelled out to match the other TPDS entries in this
% file; no hard-coded final period in the title; acronyms braced against
% sentence-casing styles; double-hyphen page range.
@article{liss:tpds0905,
  author    = {Liran Liss and Yitzhak Birk and Assaf Schuster},
  title     = {In-Kernel Integration of Operating System and {Infiniband} Functions for High Performance Computing Clusters: A {DSM} Example},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {16},
  number    = {9},
  year      = {2005},
  pages     = {830--840},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Chai et al., IPDPS 2005.
% No hard-coded final period in the title; MPI and InfiniBand braced
% against sentence-casing styles.
@inproceedings{chai:ipdps05,
  author    = {Lei Chai and Sayantan Sur and
               Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Analysis of Design Considerations for Optimizing Multi-Channel {MPI} over {InfiniBand}},
  booktitle = {IPDPS},
  year      = {2005},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Govindaraju et al., HiPC 2004.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{govindaraju:hipc04,
  author    = {Rama K. Govindaraju and Peter H. Hochschild and Don G. Grice and
               Kevin J. Gildea and Robert Blackmore and Carl A. Bender and
               Chulho Kim and Piyush Chaudhary and Jason Goscinski and
               Jay Herring and Steven Martin and John Houston},
  title     = {{Architecture and Early Performance of the New IBM HPS Fabric and Adapter}},
  booktitle = {International Conference on High Performance Computing},
  year      = {2004},
  pages     = {156--165}
}

% Yu, Panda and Buntinas, Cluster 2004.
% No hard-coded final period in the title; NIC and Myrinet/GM braced
% against sentence-casing styles; double-hyphen page range.
@inproceedings{yu:cluster04,
  author    = {Weikuan Yu and Dhabaleswar K. Panda and Darius Buntinas},
  title     = {Scalable, high-performance {NIC}-based all-to-all broadcast over {Myrinet/GM}},
  booktitle = {CLUSTER},
  year      = {2004},
  pages     = {125--134},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Jiang et al., CCGrid 2004.
% No hard-coded final period in the title; MPI-2 and InfiniBand braced
% against sentence-casing styles; double-hyphen page range.
@inproceedings{jiang:ccgrid04,
  author    = {Weihang Jiang and Jiuxing Liu and Hyun-Wook Jin and
               Dhabaleswar K. Panda and William Gropp and Rajeev Thakur},
  title     = {High performance {MPI-2} one-sided communication over {InfiniBand}},
  booktitle = {CCGRID},
  year      = {2004},
  pages     = {531--538},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


% Mamidala, Liu and Panda, Cluster 2004.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{mamidala:cluster04,
  author    = {A. R. Mamidala and J. Liu and D. K. Panda},
  title     = {{Efficient Barrier and Allreduce on Infiniband Clusters using Multicast and Adaptive Algorithms}},
  booktitle = {Cluster},
  year      = {2004},
  pages     = {135--144},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


% Thakur, Gropp and Toonen, EuroPVM/MPI 2004.
% No hard-coded final period in the title; MPI braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{thakur:europvm04,
  author    = {Rajeev Thakur and William D. Gropp and Brian R. Toonen},
  title     = {Minimizing Synchronization Overhead in the Implementation of {MPI} One-Sided Communication},
  booktitle = {PVM/MPI},
  year      = {2004},
  pages     = {57--67},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Yu, Wu and Panda, HiPC 2004.
% Page range uses a double hyphen so it typesets as an en-dash.
@inproceedings{yu:hipc04,
  author    = {Weikuan Yu and Jiesheng Wu and Dhabaleswar K. Panda},
  title     = {{Fast and Scalable Startup of MPI Programs in InfiniBand Clusters}},
  booktitle = {International Conference on High Performance Computing},
  year      = {2004},
  pages     = {440--449}
}


% Sur, Jin and Panda, ICPP 2004.
% No hard-coded final period in the title; InfiniBand braced against
% sentence-casing styles; double-hyphen page range.
@inproceedings{sur:icpp04,
  author    = {Sayantan Sur and Hyun-Wook Jin and Dhabaleswar K. Panda},
  title     = {Efficient and Scalable All-to-All Personalized Exchange for {InfiniBand}-Based Clusters},
  booktitle = {ICPP},
  year      = {2004},
  pages     = {275--282},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Liu et al., IPDPS 2004.
% No hard-coded final period in the title; product names and acronyms
% braced against sentence-casing styles.
@inproceedings{liu:ipdps04,
  author    = {Jiuxing Liu and Weihang Jiang and Pete Wyckoff and
               Dhabaleswar K. Panda and David Ashton and Darius Buntinas and
               William D. Gropp and Brian R. Toonen},
  title     = {Design and Implementation of {MPICH2} over {InfiniBand} with {RDMA} Support},
  booktitle = {IPDPS},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Yu et al., IPDPS 2004 (conference version; yu:corr04 is the CoRR copy).
% No hard-coded final period in the title; product names and NIC braced
% against sentence-casing styles.
@inproceedings{yu:ipdps04,
  author    = {Weikuan Yu and Darius Buntinas and
               Richard L. Graham and Dhabaleswar K. Panda},
  title     = {Efficient and Scalable Barrier over {Quadrics} and {Myrinet} with a New {NIC}-Based Collective Message Passing Protocol},
  booktitle = {IPDPS},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Liu, Mamidala and Panda, IPDPS 2004.
% The possessive apostrophe is restored (it had been mis-encoded as "?");
% no hard-coded final period; MPI and InfiniBand braced against
% sentence-casing styles.
@inproceedings{liu-m:ipdps04,
  author    = {Jiuxing Liu and Amith R. Mamidala and Dhabaleswar K. Panda},
  title     = {Fast and Scalable {MPI}-Level Broadcast Using {InfiniBand's} Hardware Multicast Support},
  booktitle = {IPDPS},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

% Wu, Wyckoff and Panda, IPDPS 2004.
% No hard-coded final period in the title; MPI and InfiniBand braced
% against sentence-casing styles.
@inproceedings{wu:ipdps04,
  author    = {Jiesheng Wu and Pete Wyckoff and Dhabaleswar K. Panda},
  title     = {High Performance Implementation of {MPI} Derived Datatype Communication over {InfiniBand}},
  booktitle = {IPDPS},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{yu:corr04,
  author    = {Weikuan Yu and Darius Buntinas and Richard L. Graham and
               Dhabaleswar K. Panda},
  title     = {Efficient and Scalable Barrier over Quadrics and Myrinet
               with a New NIC-Based Collective Message Passing Protocol},
  journal   = {CoRR},
  volume    = {cs.DC/0402027},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  year      = {2004}
}


@article{liu:micro04,
  author    = {Jiuxing Liu and B. Chandrasekaran and Weikuan Yu and
               Jiesheng Wu and Darius Buntinas and Sushmitha P. Kini and
               Dhabaleswar K. Panda and Pete Wyckoff},
  title     = {Microbenchmark Performance Comparison of High-Speed Cluster
               Interconnects.},
  journal   = {IEEE Micro},
  volume    = {24},
  number    = {1},
  pages     = {42-51},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@inproceedings{noronha:europar05,
  author    = {Ranjit Noronha and Dhabaleswar K. Panda},
  title     = {Performance Evaluation of MM5 on Clusters with Modern
               Interconnects: Scalability and Impact.},
  booktitle = {Euro-Par},
  pages     = {134-145},
  year      = {2005},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{liu:ijpp04,
  author    = {J. Liu and J. Wu and D. K. Panda},
  title     = {{High Performance RDMA-Based MPI Implementation over InfiniBand}},
  journal   = {International Journal of Parallel Programming},
  volume    = {32},
  number    = {3},
  pages     = {167-198},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{bala:tools03,
  author    = {B. Chandrasekaran and Pete Wyckoff and Dhabaleswar K. Panda},
  title     = {MIBA: A Micro-Benchmark Suite for Evaluating InfiniBand
               Architecture Implementations.},
  booktitle = {Computer Performance Evaluation / TOOLS},
  pages     = {29-46},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{liu:ics03,
  author    = {J. Liu and J. Wu and S. P. Kini and P. Wyckoff and D. K. Panda},
  title     = {{High Performance RDMA-based MPI Implementation over InfiniBand}},
  booktitle = {International Conference on SuperComputing},
  pages     = {295-304},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{kini:europvm03,
  author    = {Sushmitha P. Kini and Jiuxing Liu and Jiesheng Wu and
               Pete Wyckoff and Dhabaleswar K. Panda},
  title     = {Fast and Scalable Barrier Using RDMA and Multicast Mechanisms
               for InfiniBand-Based Clusters.},
  booktitle = {PVM/MPI},
  pages     = {369-378},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{liu:corr03,
  author    = {Jiuxing Liu and Weihang Jiang and Pete Wyckoff and
               Dhabaleswar K. Panda and David Ashton and Darius Buntinas and
               William Gropp and Brian R. Toonen},
  title     = {Design and Implementation of MPICH2 over InfiniBand with
               RDMA Support},
  journal   = {CoRR},
  volume    = {cs.AR/0310059},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  year      = {2003}
}


@inproceedings{liu:sc03,
  author    = {J. Liu and B. Chandrasekaran and J. Wu and W. Jiang and
               S. P. Kini and W. Yu and D. Buntinas and P. Wyckoff and
               D. K. Panda},
  title     = {{Performance Comparison of MPI Implementations over InfiniBand,
               Myrinet and Quadrics.}},
  booktitle = {SuperComputing},
  pages     = {58-69},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@article{banikazemi:tpds1201,
  author    = {Mohammad Banikazemi and Rama Govindaraju and
               Robert Blackmore and Dhabaleswar K. Panda},
  title     = {{MPI-LAPI: An Efficient Implementation of MPI for IBM RS/6000
               SP Systems.}},
  journal   = {IEEE Trans. Parallel Distrib. Syst.},
  volume    = {12},
  number    = {10},
  pages     = {1081-1093},
  year      = {2001},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@inproceedings{DBLP:conf/sc/TraffRH00,
  author    = {Jesper Larsson Tr{\"a}ff and Hubert Ritzdorf and Rolf Hempel},
  title     = {The Implementation of MPI-2 One-Sided Communication for
               the NEC SX-5.},
  booktitle = {SC},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  year      = {2000}
}


@inproceedings{shah:ipps98,
  author    = {Gautam Shah and Jarek Nieplocha and Jamshed H. Mirza and
               Chulho Kim and Robert J. Harrison and Rama Govindaraju and
               Kevin J. Gildea and Paul DiNicola and Carl A. Bender},
  title     = {{Performance and Experience with LAPI - a New High-Performance
               Communication Library for the IBM RS/6000 SP.}},
  booktitle = {IPPS/SPDP},
  pages     = {260-266},
  year      = {1998},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{lauria:jpdc97,
  author    = {Mario Lauria and Andrew A. Chien},
  title     = {MPI-FM: High Performance MPI on Workstation Clusters.},
  journal   = {J. Parallel Distrib. Comput.},
  volume    = {40},
  number    = {1},
  pages     = {4-18},
  year      = {1997},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@inproceedings{auwles:ipdps04,
  author    = {Rob T. Aulwes and David J. Daniel and Nehal N. Desai and
               Richard L. Graham and L. Dean Risinger and Mark A. Taylor and
               Timothy S. Woodall and Mitchel W. Sukalski},
  title     = {Architecture of LA-MPI, A Network-Fault-Tolerant MPI.},
  booktitle = {IPDPS},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  year      = {2004}
}

@inproceedings{aulwes:europvm03,
  author    = {Rob T. Aulwes and David J. Daniel and Nehal N. Desai and
               Richard L. Graham and L. Dean Risinger and
               Mitchel W. Sukalski and Mark A. Taylor},
  title     = {Network Fault Tolerance in LA-MPI.},
  booktitle = {PVM/MPI},
  pages     = {344-351},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}
@inproceedings{gupta:ipdps03,
  author    = {Rinku Gupta and Pavan Balaji and Dhabaleswar K. Panda and
               Jarek Nieplocha},
  title     = {Efficient Collective Operations Using Remote Memory Operations
               on VIA-Based Clusters.},
  booktitle = {IPDPS},
  pages     = {46},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{moody:sc03,
  author    = {Adam Moody and Juan Fern{\'a}ndez and Fabrizio Petrini and
               Dhabaleswar K. Panda},
  title     = {Scalable NIC-based Reduction on Large-scale Clusters.},
  booktitle = {SC},
  pages     = {59},
  year      = {2003},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@InProceedings{yuw:snapi05,
  author =	 "W. Yu and D. K. Panda",
  title =	 "{Benefits of Quadrics Scatter/Gather to PVFS2
                  Noncontiguous I/O}",
  booktitle =	 "International Workshop on Storage Network
                  Architecture and Parallel I/Os (SNAPI)",
  year =	 2005
}

@inproceedings{balaji:pfldnet05,
  author    = {V. Viswanath and P. Balaji and W. Feng and J. Leigh and
               D. K. Panda},
  title     = {{A Case for UDP Offload Engines in LambdaGrids}},
  booktitle = {International Workshop on Protocols for Fast Long-Distance
               Networks (PFLDnet)},
  year      = {2005}
}



@article{graham:lampi,
  author    = {Richard L. Graham and Sung-Eun Choi and David J. Daniel and
               Nehal N. Desai and Ronald G. Minnich and Craig E. Rasmussen and
               L. Dean Risinger and Mitchel W. Sukalski},
  title     = {{A Network-Failure-Tolerant Message-Passing System for Terascale Clusters}},
  journal   = {{Int. J. Parallel Program.}},
  volume    = {31},
  number    = {4},
  pages     = {285--303},
  year      = {2003},
  issn      = {0885-7458},
  doi       = {10.1023/A:1024504726988},
  publisher = {Kluwer Academic Publishers},
  address   = {Norwell, MA, USA},
}

@inproceedings{openmpi:europvm04,
  author    = {Edgar Gabriel and Graham E. Fagg and George Bosilca and
               Thara Angskun and Jack Dongarra and Jeffrey M. Squyres and
               Vishal Sahay and Prabhanjan Kambadur and Brian Barrett and
               Andrew Lumsdaine and Ralph H. Castain and David J. Daniel and
               Richard L. Graham and Timothy S. Woodall},
  title     = {{Open MPI: Goals, Concept, and Design of a Next Generation
               MPI Implementation.}},
  booktitle = {{EuroPVM/MPI}},
  pages     = {97-104},
  year      = {2004},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{pakin:vmi,
  author    = {Scott Pakin and Avneesh Pant},
  title     = {{{VMI}~2.0: A Dynamically Reconfigurable Messaging Layer for
               Availability, Usability, and Management}},
  booktitle = {{The 8th International Symposium on High Performance Computer
               Architecture (HPCA-8), Workshop on Novel Uses of System Area
               Networks (SAN-1)}},
  address   = {{Cambridge, Massachusetts}},
  month     = feb # {~2,},
  year      = {2002},
}

@article{mpi1,
  author  = {W. Gropp and E. Lusk and N. Doss and A. Skjellum},
  title   = {{A High-Performance, Portable Implementation of the
             {MPI} Message Passing Interface Standard}},
  journal = {Parallel Computing},
  volume  = {22},
  number  = {6},
  pages   = {789--828},
  year    = {1996}
}

@inproceedings{mpi2,
  author    = {Al Geist and William Gropp and Steve Huss-Lederman and
               Andrew Lumsdaine and Ewing L. Lusk and William Saphir and
               Tony Skjellum and Marc Snir},
  title     = {{MPI}-2: Extending the Message-Passing Interface},
  booktitle = {Euro-Par, Vol. I},
  pages     = {128-135},
  year      = {1996}
}

@InProceedings{jiangw:ccgrid04,
	author = "W. Jiang and J. Liu and H.-W. Jin and D. K. Panda and W. Gropp and R. Thakur",
	title = "{High Performance MPI-2 One-Sided Communication over InfiniBand}",
	booktitle = "{International Symposium on Cluster Computing and the
		Grid (CCGrid 04)}",
	month = "April",
	year = "2004"
}

@InProceedings{jiangw:europvm04,
	author = "W. Jiang and J. Liu and H. W. Jin and D. K. Panda and
		D. Buntinas and R. Thakur and W. Gropp",
	title = "{Efficient Implementation of MPI-2 Passive One-Sided
			Communication on InfiniBand Clusters}",
	booktitle = "EuroPVM/MPI",
	month = "September",
	year = "2004"
}

@inproceedings{thakur:europvm04,
  author    = {R. Thakur and W. Gropp and B. Toonen},
  title     = {{Minimizing Synchronization Overhead in the Implementation of
               MPI One-Sided Communication}},
  booktitle = {EuroPVM/MPI},
  month     = {September},
  year      = {2004}
}

@techreport{bonachea:gasnet,
		author = "D. Bonachea",
		title = "{GASNet Specification, v1.1}",
		institution = "{Computer Science Division, University of California at Berkeley}",
		number = "UCB/CSD-02-1207",
		month = "October",
		year = "2002"
	}

@article{BSP,
	author  = "M. Goudreau and K. Lang and S. B. Rao and T. Suel and T. Tsantilas",
	title   = "{Portable and Efficient Parallel Computing Using the BSP Model}",
	journal = "{IEEE Transactions on Computers}",
	year    = 1999,
	pages   = "670--689"
}

@book{duato:book,
  author    = {J. Duato and S. Yalamanchili and L. Ni},
  title     = {{Interconnection Networks: An Engineering Approach}},
  publisher = {The IEEE Computer Society Press},
  year      = {1997}
}


@article{NPB,
	author = "D. H. Bailey and E. Barszcz and J. T. Barton and D. S. Browning and R. L. Carter and D. Dagum and R. A. Fatoohi and P. O. Frederickson and T. A. Lasinski and R. S. Schreiber and H. D. Simon and V. Venkatakrishnan and S. K. Weeratunga",
	title = "{The NAS Parallel Benchmarks}",
	journal = "The International Journal of Supercomputer Applications",
	volume = "5",
	number = "3",
	pages = "63--73",
	year = "1991",
	url = "citeseer.ist.psu.edu/bailey95nas.html"
}

@article{MPILAPI,
  author  = {M. Banikazemi and R. K. Govindaraju and R. Blackmore and D. K. Panda},
  title   = {{MPI-LAPI: An Efficient Implementation of MPI for IBM RS/6000 SP Systems}},
  journal = {{IEEE Transactions on Parallel and Distributed Systems}},
  pages   = {1081-1093},
  month   = {October},
  year    = {2001}
}

@misc{DAT,
  author       = {{DAT Collaborative}},
  title        = {{uDAPL: User Direct Access Programming Library Version 1.2}},
  howpublished = {{http://www.datcollaborative.org/udapl.html}},
  month        = {July},
  year         = {2004}
}

@misc{OPENIB,
  author       = {{OpenFabrics Organization}},
  howpublished = {{http://www.openib.org/}},
}

@misc{MVICH,
  author = {{Lawrence Livermore National Laboratory}},
  title  = {{MVICH: MPI for Virtual Interface Architecture}},
  month  = {August},
  year   = {2001}
}

@inproceedings{hoefler-parsim-06,
  author    = "T. Hoefler and P. Gottschling and W. Rehm and A. Lumsdaine",
  title     = "{Optimizing a Conjugate Gradient Solver with Non-Blocking Collective Operations}",
  booktitle = "Proceedings, 13th European PVM/MPI Users' Group Meeting",
  series    = "Lecture Notes in Computer Science",
  publisher = "Springer-Verlag",
  address   = "Bonn, Germany",
  month     = "September",
  year      = "2006",
  source    = "http://www.open-mpi.org/papers/",
}

@techreport{Hursey-Open-MPI-CRS,
  author      = "Joshua Hursey and Jeffrey M. Squyres and Andrew Lumsdaine",
  title       = "A Checkpoint and Restart Service Specification for Open MPI",
  institution = "Indiana University",
  number      = "TR635",
  address     = "Bloomington, Indiana, USA",
  month       = "July",
  year        = "2006"
}

/* NOTE(review): booktitle and year below are inferred from the citation key (SC 2006); confirm against the proceedings. Page numbers are still missing. */
@inproceedings{carlos-sc-06,
 author = {Jose Carlos Sancho Pitarch and Kevin J. Barker and Darren J. Kerbyson and Kei Davis },
 title = {{Quantifying the Potential Benefit of Overlapping Communication and Computation in Large-Scale Scientific Applications}},
 booktitle = {SC '06: Proceedings of the 2006 ACM/IEEE Conference on Supercomputing},
 year = {2006},
}

@inproceedings{coll:cluster01,
  author = 	 "S. Coll and E. Frachtenberg and F. Petrini and A. Hoisie and L. Gurvits",
  title = 	 "{Using Multirail Networks in High-Performance Clusters}",
  booktitle = 	 {Cluster},
  year =	 {2001},
  pages = {16--24},
  url = {citeseer.ist.psu.edu/coll01using.html}
}

@inproceedings{angskun:dapsys06,
  author    = "Thara Angskun and Graham E. Fagg and George Bosilca and
               Jelena Pjesivac-Grbovic and Jack J. Dongarra",
  title     = "{Self-Healing Network for Scalable Fault Tolerant Runtime Environments}",
  booktitle = "Proceedings of 6th Austrian-Hungarian workshop on distributed
               and parallel systems",
  publisher = "Springer-Verlag",
  address   = "Innsbruck, Austria",
  month     = "September",
  year      = "2006",
}


@inproceedings{lampi:ipdps04,
  author    = {Rob T. Aulwes and David J. Daniel and Nehal N. Desai and
               Richard L. Graham and L. Dean Risinger and Mark A. Taylor and
               Timothy S. Woodall and Mitchel W. Sukalski},
  title     = {{Architecture of LA-MPI, A Network-Fault-Tolerant MPI.}},
  booktitle = {IPDPS},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  year      = {2004}
}

@article{petrini:micro05,
 author = {F. Petrini and W. Feng and A. Hoisie and S. Coll and E. Frachtenberg},
 title = "{The Quadrics Network: High-Performance Clustering Technology}",
 journal = {IEEE Micro},
 volume = {22},
 number = {1},
 year = {2002},
 issn = {0272-1732},
 pages = {46--57},
 doi = {10.1109/40.988689},
 publisher = {IEEE Computer Society Press}
 }

@inproceedings{geoffray:hpcasia04,
  author    = "Patrick Geoffray",
  title     = "{Myrinet eXpress (MX): Is Your Interconnect Smart?}",
  booktitle = "HPCASIA '04: Proceedings of the High Performance Computing and
               Grid in Asia Pacific Region, Seventh International Conference
               on (HPCAsia'04)",
  pages     = "452--452",
  publisher = "IEEE Computer Society",
  address   = "Washington, DC, USA",
  isbn      = "0-7695-2138-X",
  year      = "2004"
}

@misc{IMB,
  howpublished = { http://www.intel.com/cd/software/products/},
  title        = {{Intel MPI Benchmark}}
}

% NOTE(review): the key "quadrics" is already defined earlier in this file, so
% this entry triggered a "Repeated entry" error and could never be cited.
% It is given a distinct key here; citations of "quadrics" still resolve to
% the earlier entry.
@misc{quadrics:qsw,
  title =        "{Quadrics Supercomputers World Ltd.}",
  howpublished = "http://www.quadrics.com/"
}

@Misc{ammasso,
  author =       {{Ammasso Incorporation}},
  howpublished =
                  {http://\linebreak[0]www.\linebreak[0]ammasso.\linebreak[0]com/}
}

@manual{MPI,
  title        = {MPI: A Message-Passing Interface Standard},
  organization = {Message Passing Interface Forum},
  month        = {Mar},
  year         = {1994}
}
  
@misc{kernel,
  howpublished = {http://www.kernel.org/},
  title        = {{The Linux Kernel Archives}}
}

@article{boden:micro95,
	author = "N. J. Boden and D. Cohen and R. E. Felderman and A. E. Kulawik and C. L. Seitz and J. N. Seizovic and W. Su",
	title = "{Myrinet: A Gigabit-per-second Local Area Network}",
	journal = "{IEEE Micro}",
	volume = "15",
	number = "1",
	month = "February",
	year  = "1995",
	pages = "29--36"
}

@inproceedings{eicken:isca92,
  author    = {T. von Eicken and D. E. Culler and S. C. Goldstein and K. E. Schauser},
  title     = {{Active Messages: A Mechanism for Integrated Communication and Computation}},
  booktitle = {International Symposium on Computer Architecture},
  pages     = {256-266},
  year      = {1992}
}

@inproceedings{pakin:sc95,
  author    = {S. Pakin and M. Lauria and A. Chien},
  title     = {{High Performance Messaging on Workstations: Illinois Fast Messages (FM)}},
  booktitle = {Proceedings of the Supercomputing},
  year      = {1995}
}



@inproceedings{blumrich:micro95,
  author    = {M. Blumrich and C. Dubnicki and E. W. Felten and K. Li and M. R. Mesarina},
  title     = {{Virtual-Memory-Mapped Network Interfaces}},
  booktitle = {{IEEE Micro}},
  pages     = {21-28},
  month     = {Feb.},
  year      = {1995}
}

@article{MPISHMEM,
  author  = {W. Gropp and E. Lusk},
  title   = {{A High-Performance MPI Implementation on a Shared-Memory
             Vector Supercomputer}},
  journal = {Parallel Computing},
  volume  = {22},
  number  = {11},
  pages   = {1513--1526},
  month   = jan,
  year    = {1997},
}

@inproceedings{MPISTART,
  author    = {P. Husbands and J. C. Hoe},
  title     = {{MPI-StarT: Delivering Network Performance to Numerical Applications}},
  booktitle = {Proceedings of the Supercomputing},
  year      = {1998}
}

@inproceedings{striping_protocol,
  author    = {H. Adiseshu and G. M. Parulkar and G. Varghese},
  title     = {{A Reliable and Scalable Striping Protocol}},
  booktitle = {{SIGCOMM}},
  pages     = {131-141},
  year      = {1996},
  url       = {citeseer.ist.psu.edu/adiseshu96reliable.html}
}

@article{via_dunning98,
  author  = {D. Dunning and G. Regnier and G. McAlpine and D. Cameron and
             B. Shubert and F. Berry and A.M. Merritt and E. Gronke and
             C. Dodd},
  title   = {{The Virtual Interface Architecture}},
  journal = {{IEEE Micro}},
  pages   = {66-76},
  month   = {March/April},
  year    = {1998}
}

@misc{VIA-SPEC,
  author = {Compaq and Intel and Microsoft},
  title  = {{VI Architecture Specification V1.0}},
  month  = {December},
  year   = {1997}
}

@inproceedings{MB_VIA_IPDPS_2000,
  author    = {M. Banikazemi and V. Moorthy and L. Herger and D. K. Panda and B. Abali},
  title     = {{Efficient Virtual Interface Architecture Support for the IBM SP
               Switch-Connected NT Clusters}},
  booktitle = {{Int'l Parallel and Distributed Processing Symposium (IPDPS '00)}},
  pages     = {33--42},
  month     = {May},
  year      = {2000}
}
      
@article{gropp:96,
  author  = {W. Gropp and E. Lusk and N. Doss and A. Skjellum},
  title   = {A high-performance, portable implementation of the {MPI} message
             passing interface standard},
  journal = {Parallel Computing},
  volume  = {22},
  number  = {6},
  pages   = {789--828},
  month   = sep,
  year    = {1996}
}
@inproceedings{koop:ccgrid07,
  author    = {M. Koop and T. Jones and D. K. Panda},
  title     = {{Reducing Connection Memory Requirements of MPI for InfiniBand
               Clusters: A Message Coalescing Approach}},
  booktitle = {Proceedings of Int'l Symposium on Cluster Computing and the
               Grid (CCGrid)},
  month     = {May},
  year      = {2007}
}


@inproceedings{vaidyana:cac07,
  author    = {K. Vaidyanathan and W. Huang and L. Chai and D. K. Panda},
  title     = {{Designing Efficient Asynchronous Memory Operations Using
               Hardware Copy Engine: A Case Study with I/OAT}},
  booktitle = {International Workshop on Communication Architecture for
               Clusters, held in conjunction with IPDPS '07},
  month     = {March},
  year      = {2007}
}

@article{petrini:jcc03,
  author  = {Fabrizio Petrini and Eitan Frachtenberg and Adolfy Hoisie and
             Salvador Coll},
  title   = {{Performance Evaluation of the Quadrics Interconnection Network}},
  journal = {{Journal of Cluster Computing}},
  volume  = {6},
  number  = {2},
  pages   = {125--142},
  month   = {April},
  year    = {2003},
}


@inproceedings{sanjay:wsc01,
 author = {Sanjay Shakkottai and R. Srikant},
 title = {Deterministic fluid models of congestion control in high-speed networks},
 booktitle = {WSC '01: Proceedings of the 33rd conference on Winter simulation},
 year = {2001},
 isbn = {0-7803-7309-X},
 pages = {1275--1281},
 location = {Arlington, Virginia},
 publisher = {IEEE Computer Society},
 }

@article{floyd:atn93,
  author  = {S. Floyd and V. Jacobson},
  title   = {{Random Early Detection Gateways for Congestion Avoidance}},
  journal = {IEEE\slash ACM Transactions on Networking},
  volume  = {1},
  number  = {4},
  pages   = {397--413},
  year    = {1993},
  url     = {citeseer.ist.psu.edu/floyd93random.html}
}

@inproceedings{wang:globecom99,
  author = "H. Wang and K. Shin",
  title = "{Refined Design of Random Early Detection Gateways}",
  booktitle = "Proceedings of IEEE GLOBECOM",
  year = "1999",
  url = "citeseer.ist.psu.edu/wang99refined.html" }

@inproceedings{qian:cac06,
  author    = "Ying Qian and Ahmad Afsahi",
  title     = "{Efficient RDMA-based Multi-Port Collectives on Multi-Rail QsNet Clusters}",
  booktitle = "Workshop on Communication Architecture for Clusters, IPDPS",
  year      = {2006}
}

@inproceedings{sistare:sc02,
  author    = "Steven J. Sistare and Christopher J. Jackson",
  title     = "Ultra-high performance communication with MPI and the Sun fire
               link interconnect",
  booktitle = "Supercomputing '02: Proceedings of the 2002 ACM/IEEE conference
               on Supercomputing",
  pages     = "1--15",
  location  = "Baltimore, Maryland",
  year      = "2002"
}


@inproceedings{gropp:europvm07,
  author    = {William D. Gropp and Rajeev Thakur},
  title     = {Revealing the Performance of MPI RMA Implementations},
  booktitle = {PVM/MPI},
  pages     = {272-280},
  year      = {2007},
  ee        = {http://dx.doi.org/10.1007/978-3-540-75416-9_38},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{shipman:europvm07,
  author    = {Galen M. Shipman and Ron Brightwell and Brian Barrett and
               Jeffrey M. Squyres and Gil Bloch},
  title     = {Investigations on InfiniBand: Efficient Network Buffer
               Utilization at Scale},
  booktitle = {PVM/MPI},
  pages     = {178-186},
  year      = {2007},
  ee        = {http://dx.doi.org/10.1007/978-3-540-75416-9_28},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{barrett:europvm07,
  author    = {Brian Barrett and Galen M. Shipman and Andrew Lumsdaine},
  title     = {Analysis of Implementation Options for MPI-2 One-Sided},
  booktitle = {PVM/MPI},
  pages     = {242-250},
  year      = {2007},
  ee        = {http://dx.doi.org/10.1007/978-3-540-75416-9_35},
  crossref  = {DBLP:conf/pvm/2007},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{brunner00scalable,
  author    = {R. K. Brunner and J. C. Phillips and L. V. Kale},
  title     = {{Scalable Molecular Dynamics for Large Biomolecular Systems}},
  booktitle = {SuperComputing (SC'2000)},
  pages     = {67--85},
  year      = {2000}
}

@inproceedings{patterson:podc95,
  author    = {D. A. Patterson and D. E. Culler and T. E. Anderson},
  title     = {{A Case for NOW (Networks of Workstations)}},
  booktitle = {Principles of Distributed Computing},
  pages     = {17-28},
  year      = {1995}
}

@inproceedings{stewart:europvm07,
  author    = {L. C. Stewart and D. Gingold and J. Leonard and P. Watkins},
  title     = {{RDMA in the SiCortex Cluster Systems}},
  booktitle = {EuroPVM/MPI},
  pages     = {260-271},
  year      = {2007}
}

@inproceedings{kay:sigcomm93,
  author    = {J. Kay and J. Pasquale},
  title     = {{The Importance of Non-Data Touching Processing Overheads in
               {TCP}/{IP}}},
  booktitle = {{SIGCOMM}},
  pages     = {259-268},
  year      = {1993}
}

@article{hari:tcs99,
  author  = {A. Hari and G. Varghese and G. Parulkar},
  title   = {{An Architecture for Packet-Striping Protocols}},
  journal = {ACM Transactions on Computer Systems},
  volume  = {17},
  number  = {4},
  pages   = {249--287},
  year    = {1999}
}

@inproceedings{tezuka:ipps98,
  author    = {H. Tezuka and F. O'Carroll and A. Hori and Y. Ishikawa},
  title     = {{Pin-Down Cache: A Virtual Memory Management Technique for
               Zero-Copy Communication}},
  booktitle = {IPPS/SPDP},
  pages     = {308-314},
  year      = {1998},
}

@article{nieplocha:psw94,
  author  = "Nieplocha, Jaroslaw and Harrison, Robert J. and
             Littlefield, Richard J.",
  title   = "{Global Arrays: A Nonuniform Memory Access Programming Model for
             High-Performance Computers}",
  journal = "Journal of Supercomputing",
  volume  = "10",
  number  = "2",
  pages   = "169--189",
  issn    = "0920-8542",
  year    = "1996",
}


@article{nwchem,
  author  = {Kendall, Ricky A. and Apr\`{a}, Edoardo and
             Bernholdt, David E. and Bylaska, Eric J. and Dupuis, Michel and
             Fann, George I. and Harrison, Robert J. and Ju, Jialin and
             Nichols, Jeffrey A. and Nieplocha, Jarek and Straatsma, T. P. and
             Windus, Theresa L. and Wong, Adrian T. },
  title   = {{High Performance Computational Chemistry: An Overview of NWChem,
             A Distributed Parallel Application}},
  journal = {Computer Physics Communications},
  volume  = {128},
  number  = {1-2},
  pages   = {260--283},
  month   = {June},
  year    = {2000},
}

@inproceedings{armci,
  author    = "Jarek Nieplocha and Bryan Carpenter",
  title     = "{ARMCI: A Portable Remote Memory Copy Library for Distributed
               Array Libraries and Compiler Run-Time Systems}",
  booktitle = "Lecture Notes in Computer Science",
  publisher = "Springer-Verlag",
  pages     = "533--546",
  year      = "1999"
}

@inproceedings{lakamraju:dsn03,
  author    = {Vijay Lakamraju and Israel Koren and C. Mani Krishna},
  title     = {{Low Overhead Fault Tolerant Networking in Myrinet}},
  booktitle = {Dependable Systems and Networks},
  pages     = {193-202},
  year      = {2003}
}

@inproceedings{wu:cluster02,
  author    = {Jiesheng Wu and Jiuxing Liu and Pete Wyckoff and
               Dhabaleswar K. Panda},
  title     = {Impact of On-Demand Connection Management in MPI over VIA},
  booktitle = {CLUSTER},
  pages     = {152-159},
  year      = {2002},
  ee        = {http://csdl.computer.org/comp/proceedings/cluster/2002/1745/00/17450152abs.htm},
  crossref  = {DBLP:conf/cluster/2002},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{koop:ics07,
  author    = {Matthew J. Koop and Sayantan Sur and Qi Gao and
               Dhabaleswar K. Panda},
  title     = {High performance MPI design using unreliable datagram for
               ultra-scale InfiniBand clusters},
  booktitle = {ICS},
  pages     = {180-189},
  year      = {2007},
  ee        = {http://doi.acm.org/10.1145/1274971.1274997},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}


@inproceedings{koop:cluster07-1,
  author    = {Matthew J. Koop and Sayantan Sur and Dhabaleswar K. Panda},
  title     = {Zero-copy protocol for MPI using infiniband unreliable datagram},
  booktitle = {CLUSTER},
  pages     = {179-186},
  year      = {2007},
  ee        = {http://dx.doi.org/10.1109/CLUSTR.2007.4629230},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{koop:ipdps08,
  author    = {Matthew J. Koop and Terry Jones and Dhabaleswar K. Panda},
  title     = {MVAPICH-Aptus: Scalable high-performance multi-transport
               MPI over InfiniBand},
  booktitle = {IPDPS},
  pages     = {1-12},
  year      = {2008},
  ee        = {http://dx.doi.org/10.1109/IPDPS.2008.4536283},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{koop:cluster08-1,
  author    = {Matthew J. Koop and Jaidev K. Sridhar and Dhabaleswar K. Panda},
  title     = {Scalable MPI design over InfiniBand using eXtended Reliable
               Connection},
  booktitle = {CLUSTER},
  pages     = {203-212},
  year      = {2008},
  ee        = {http://dx.doi.org/10.1109/CLUSTR.2008.4663773},
  crossref  = {DBLP:conf/cluster/2008},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{edo:sc09,
		author = {Apr{\`a}, Edoardo and Rendell, Alistair P. and Harrison, Robert J. and Tipparaju, Vinod and de Jong, Wibe A. and Xantheas, Sotiris S.},
		title = {Liquid water: obtaining the right answer for the right reasons},
		booktitle = {SC '09: Proceedings of the Conference on High Performance Computing Networking, Storage and Analysis},
		year = {2009},
		pages = {1--7},
}

@inproceedings{vishnu:ccpe,
    author = "A. Vishnu and M. Koop and A. Moody and A. Mamidala and
                S. Narravula and D. K. Panda",
    title = "{Topology Agnostic Hot-Spot Avoidance with InfiniBand}",
    booktitle = "{Concurrency and Computation: Practice and Experience, Special
                    Issue of Best Papers from CCGrid '07}",
    year = {2008}
}

@inproceedings{blocksome:sc06,
		author    = {Michael Blocksome and
				Charles Archer and
						Todd Inglett and
						Patrick McCarthy and
						Michael Mundy and
						Joe Ratterman and
						A. Sidelnik and
						Brian E. Smith and
						George Alm{\'a}si and
						Jos{\'e} G. Casta{\~n}os and
						Derek Lieber and
						Jos{\'e} E. Moreira and
						Sriram Krishnamoorthy and
						Vinod Tipparaju and
						Jarek Nieplocha},
		title     = {Blue Gene system software - Design and implementation of
				a one-sided communication interface for the IBM eServer
					Blue Gene{\textregistered}},
		booktitle = {SuperComputing},
		year      = {2006},
		pages     = {120--128},
		bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{tipparaju:sc05,
  author    = {Vinod Tipparaju and Jarek Nieplocha},
  title     = {{Optimizing All-to-All Collective Communication by Exploiting
               Concurrency in Modern Networks}},
  booktitle = {SuperComputing},
  pages     = {4654},
  year      = {2005},
}


@inproceedings{upc,
  author    = {Parry Husbands and Costin Iancu and Katherine A. Yelick},
  title     = {{A Performance Analysis of the Berkeley UPC Compiler}},
  booktitle = {International Conference on Supercomputing},
  pages     = {63-73},
  year      = {2003}
}


% OOPSLA '05 paper introducing the X10 language.
@inproceedings{x10,
  author    = {Philippe Charles and Christian Grothoff and Vijay Saraswat and
               Christopher Donawa and Allan Kielstra and Kemal Ebcioglu and
               Christoph von Praun and Vivek Sarkar},
  title     = {{X10: An Object-Oriented Approach to Non-Uniform Cluster Computing}},
  booktitle = {OOPSLA '05: Proceedings of the 20th annual ACM SIGPLAN conference on Object-oriented programming, systems, languages, and applications},
  publisher = {ACM},
  year      = {2005},
  pages     = {519--538}
}

% Journal article on exascale computer-science challenges (2009).
% The journal name is spelled "... Journal of High Performance Computing
% Applications", the title that belongs to ISSN 1094-3420.
@article{geist:ijhpca09,
  author  = {Geist, Al and Lucas, Robert},
  title   = {{Major Computer Science Challenges At Exascale}},
  journal = {International Journal of High Performance Computing Applications},
  volume  = {23},
  number  = {4},
  pages   = {427--436},
  year    = {2009},
  issn    = {1094-3420}
}

% Report on software challenges at extreme scale, filed under SciDAC Review.
% NOTE(review): the entry has no author field, which BibTeX reports as a
% warning for this entry type - confirm the intended author and type.
@inproceedings{exascale:scidac_software,
  title     = {{Software Challenges at Extreme Scale}},
  booktitle = {SciDAC Review},
  year      = {2009}
}

% ExaScale software study, filed under DARPA Review.
% The title no longer ends with a line break, which BibTeX would turn into a
% trailing space before the closing punctuation.
% NOTE(review): the entry has no author field - confirm author and entry type.
@inproceedings{exascale:darpa_software,
  title     = {{ExaScale Software Study: Software Challenges in Extreme Scale Systems}},
  booktitle = {DARPA Review},
  year      = {2009}
}


% UC Berkeley EECS technical report UCB/EECS-2006-183.
@techreport{yelick:13dwarfs,
  author      = {Asanovic, Krste and Bodik, Ras and
                 Catanzaro, Bryan Christopher and Gebis, Joseph James and
                 Husbands, Parry and Keutzer, Kurt and Patterson, David A. and
                 Plishker, William Lester and Shalf, John and
                 Williams, Samuel Webb and Yelick, Katherine A.},
  title       = {{The Landscape of Parallel Computing Research: A View from Berkeley}},
  institution = {EECS Department, University of California, Berkeley},
  number      = {UCB/EECS-2006-183},
  year        = {2006}
}

% Magazine article on user-level network interface protocols (1998).
% ISSN 0018-9162 with volume 31 identifies the IEEE Computer magazine, not
% IEEE Transactions on Computers, so the journal field is corrected.
% The umlaut is written as a BibTeX special character for correct sorting.
@article{bal:computers98,
  author  = {Bhoedjang, Raoul A. F. and R{\"u}hl, Tim and Bal, Henri E.},
  title   = {{User-Level Network Interface Protocols}},
  journal = {IEEE Computer},
  volume  = {31},
  number  = {11},
  pages   = {53--60},
  year    = {1998},
  issn    = {0018-9162}
}

% Journal article on the Chapel language (2007).
% Journal name corrected to "... Journal of ..."; author initials are
% separated by spaces so BibTeX treats them as distinct name tokens.
@article{chapel,
  author  = {Chamberlain, B. L. and Callahan, D. and Zima, H. P.},
  title   = {{Parallel Programmability and the Chapel Language}},
  journal = {International Journal of High Performance Computing Applications},
  volume  = {21},
  number  = {3},
  pages   = {291--312},
  year    = {2007},
  issn    = {1094-3420}
}

% EuroPVM/MPI 2004 paper on an MPI implementation for Cray SHMEM.
% The page range uses the BibTeX double hyphen.
@inproceedings{shmem,
  author    = {Ron Brightwell},
  title     = {{A New MPI Implementation for Cray SHMEM}},
  booktitle = {EuroPVM/MPI},
  year      = {2004},
  pages     = {122--130}
}

% Journal article on MPI as a compilation target for parallel languages (2004).
% ISSN 1740-0562 with volume 1 belongs to the International Journal of High
% Performance Computing and Networking, so the journal field is corrected.
@article{gasnet,
  author  = {Bonachea, Dan and Duell, Jason},
  title   = {{Problems with using MPI 1.1 and 2.0 as Compilation Targets for Parallel Language Implementations}},
  journal = {International Journal of High Performance Computing and Networking},
  volume  = {1},
  number  = {1--3},
  pages   = {91--99},
  year    = {2004},
  issn    = {1740-0562}
}

% ICS '08 paper on the Deep Computing Messaging Framework for Blue Gene/P.
@inproceedings{sameer:ics08,
  author    = {Kumar, Sameer and Dozsa, Gabor and Almasi, Gheorghe and
               Heidelberger, Philip and Chen, Dong and Giampapa, Mark E. and
               Blocksome, Michael and Faraj, Ahmad and Parker, Jeff and
               Ratterman, Joseph and Smith, Brian and Archer, Charles J.},
  title     = {{The Deep Computing Messaging Framework: Generalized Scalable Message Passing on the Blue Gene/P Supercomputer}},
  booktitle = {ICS '08: Proceedings of the 22nd annual international conference on Supercomputing},
  pages     = {94--103},
  isbn      = {978-1-60558-158-3},
  year      = {2008}
}

% ICS '06 paper on fault-tolerant membership for MPI tasks.
@inproceedings{varma:ics06,
  author    = {Varma, Jyothish and Wang, Chao and Mueller, Frank and
               Engelmann, Christian and Scott, Stephen L.},
  title     = {{Scalable, Fault Tolerant Membership for MPI tasks on HPC Systems}},
  booktitle = {ICS '06: Proceedings of the 20th annual international conference on Supercomputing},
  pages     = {219--228},
  year      = {2006}
}

% ICPP '09 paper describing the CIFTS fault-tolerance infrastructure.
@inproceedings{cifts,
  author    = {Gupta, Rinku and Beckman, Pete and Park, Byung-Hoon and
               Lusk, Ewing and Hargrove, Paul and Geist, Al and
               Panda, Dhabaleswar and Lumsdaine, Andrew and Dongarra, Jack},
  title     = {{CIFTS: A Coordinated Infrastructure for Fault-Tolerant Systems}},
  booktitle = {ICPP '09: Proceedings of the 2009 International Conference on Parallel Processing},
  pages     = {237--245},
  year      = {2009}
}

% SC '03 paper on MPICH-V2.
% Acronyms in the title are brace-protected so sentence-casing styles keep
% them upper-case; accents are written as BibTeX special characters.
@inproceedings{mpichv2,
  author    = {Bouteiller, Aur{\'e}lien and Cappello, Franck and
               Herault, Thomas and Krawezik, G{\'e}raud and
               Lemarinier, Pierre and Magniette, Fr{\'e}d{\'e}ric},
  title     = {{MPICH-V2}: a Fault Tolerant {MPI} for Volatile Nodes based on Pessimistic Sender Based Message Logging},
  booktitle = {SC '03: Proceedings of the 2003 ACM/IEEE conference on Supercomputing},
  year      = {2003},
  isbn      = {1-58113-695-1},
  pages     = {25}
}

% Supercomputing '02 paper on MPICH-V.
% Acronyms in the title are brace-protected against sentence-casing, and the
% names Bouteiller and Magniette carry the accents used in the MPICH-V2 entry
% of this file.
@inproceedings{mpichv,
  author    = {Bosilca, George and Bouteiller, Aur{\'e}lien and
               Cappello, Franck and Djilali, Samir and Fedak, Gilles and
               Germain, Cecile and Herault, Thomas and Lemarinier, Pierre and
               Lodygensky, Oleg and Magniette, Fr{\'e}d{\'e}ric and
               Neri, Vincent and Selikhov, Anton},
  title     = {{MPICH-V}: toward a scalable fault tolerant {MPI} for volatile nodes},
  booktitle = {Supercomputing '02: Proceedings of the 2002 ACM/IEEE conference on Supercomputing},
  year      = {2002},
  pages     = {1--18}
}

% CF '09 paper on checkpoint-restart of global address space applications.
% "InfiniBand" is capitalised and brace-protected; the "Jr." suffix is written
% in the standard "Last, Jr., First" form.
@inproceedings{villa:cf09,
  author    = {Villa, Oreste and Krishnamoorthy, Sriram and
               Nieplocha, Jarek and Brown, Jr., David M.},
  title     = {Scalable transparent checkpoint-restart of global address space applications on virtual machines over {InfiniBand}},
  booktitle = {CF '09: Proceedings of the 6th ACM conference on Computing frontiers},
  year      = {2009},
  isbn      = {978-1-60558-413-3},
  pages     = {197--206},
  location  = {Ischia, Italy}
}

% USENIX '06 paper on VMM-bypass I/O.
% The acronyms VMM and I/O are brace-protected so sentence-casing styles do
% not lower-case them.
@inproceedings{liu:usenix06,
  author    = {Liu, Jiuxing and Huang, Wei and Abali, Bulent and
               Panda, Dhabaleswar K.},
  title     = {High performance {VMM}-bypass {I/O} in virtual machines},
  booktitle = {ATEC '06: Proceedings of the annual conference on USENIX '06 Annual Technical Conference},
  year      = {2006},
  pages     = {3--3},
  location  = {Boston, MA},
  publisher = {USENIX Association}
}


% Paper on FT-MPI from the 7th European PVM/MPI Users' Group Meeting (2000).
% The acronyms FT-MPI and MPI are brace-protected against sentence-casing.
@inproceedings{ftmpi,
  author    = {Fagg, Graham E. and Dongarra, Jack},
  title     = {{FT-MPI}: Fault Tolerant {MPI}, Supporting Dynamic Applications in a Dynamic World},
  booktitle = {Proceedings of the 7th European PVM/MPI Users' Group Meeting on Recent Advances in Parallel Virtual Machine and Message Passing Interface},
  year      = {2000},
  isbn      = {3-540-41010-4},
  pages     = {346--353},
  address   = {London, UK}
}

% Journal article on fault tolerance in MPI programs (volume 18, 2004).
% Journal name corrected to "... Journal of High Performance Computing
% Applications", the title that belongs to ISSN 1094-3420.
@article{gropp:ijhpca02,
  author  = {Gropp, William and Lusk, Ewing},
  title   = {{Fault Tolerance in Message Passing Interface Programs}},
  journal = {International Journal of High Performance Computing Applications},
  volume  = {18},
  number  = {3},
  pages   = {363--372},
  year    = {2004},
  issn    = {1094-3420}
}

% HiPC 2010 paper on fault-tolerant communication runtime support.
@inproceedings{vishnu:hipc10,
  author    = {Vishnu, Abhinav and Van Dam, Hubertus and De Jong, Wibe and
               Balaji, Pavan and Song, Shuaiwen},
  title     = {{Fault Tolerant Communication Runtime Support for Data Centric Programming Models}},
  booktitle = {International Conference on High Performance Computing},
  year      = {2010}
}


% Conference paper "Liquid Water" (booktitle SuperComputing, 2009).
% NOTE(review): the entry just above this one in the file lists the same
% authors and title for SC '09 - likely a duplicate; consider merging keys.
@inproceedings{apra:sc09,
  author    = {Edoardo Apr{\`a} and Alistair P. Rendell and
               Robert J. Harrison and Vinod Tipparaju and
               Wibe A. deJong and Sotiris S. Xantheas},
  title     = {{Liquid Water: Obtaining The Right Answer For The Right Reasons}},
  booktitle = {SuperComputing},
  year      = {2009}
}


% Conference paper (booktitle SuperComputing, 2010) on multi-level checkpointing.
@inproceedings{moody:sc10,
  author    = {Moody, Adam and Bronevetsky, Greg and Mohror, Kathryn and
               Supinski, Bronis},
  title     = {{Design, Modeling, and Evaluation of a Scalable Multi-level Checkpointing System}},
  booktitle = {SuperComputing},
  year      = {2010}
}

% IPDPS 2010 paper on communication-avoiding LU and QR factorizations.
% Authors are separated with "and"; the original comma-separated list makes
% BibTeX report "too many commas in name".
@inproceedings{donfack:ipdps10,
  author    = {Donfack, S. and Grigori, L. and Gupta, A. Kumar},
  title     = {{Adapting communication-avoiding LU and QR factorizations to multicore architectures}},
  booktitle = {IPDPS},
  year      = {2010}
}

% Journal article on ScalaBLAST (IEEE TPDS, volume 17, 2006).
% The page range uses the double hyphen, and ScalaBLAST / BLAST are
% brace-protected so sentence-casing styles keep their capitalisation.
@article{scalablast,
  author    = {Christopher Oehmen and Jarek Nieplocha},
  title     = {{ScalaBLAST}: A Scalable Implementation of {BLAST} for High-Performance Data-Intensive Bioinformatics Analysis},
  journal   = {IEEE Transactions on Parallel and Distributed Systems},
  volume    = {17},
  pages     = {740--749},
  year      = {2006},
  issn      = {1045-9219},
  publisher = {IEEE Computer Society}
}

% Article on the PLASMA and MAGMA projects in Journal of Physics: Conference
% Series, volume 180.
% Authors are separated with "and"; the entry is typed as an article because
% it carries a journal and a volume; the volume is a plain number.
% NOTE(review): year 2009 was added as the publication year of volume 180 -
% confirm against the publisher record.
@article{magma,
  author      = {Agullo, E. and Demmel, J. and Dongarra, J. and Hadri, B. and
                 Kurzak, J. and Langou, J. and Ltaief, H. and Luszczek, P. and
                 Tomov, S.},
  title       = {Numerical linear algebra on emerging architectures: The
                 {PLASMA} and {MAGMA} projects},
  journal     = {Journal of Physics: Conference Series},
  volume      = {180},
  year        = {2009},
  institution = {Innovative Computing Laboratory, University of Tennessee}
}


% IPDPS 2007 paper on dynamic load balancing with message passing.
% The page range uses the BibTeX double hyphen.
@inproceedings{dinan:ipdps07,
  author    = {James Dinan and Stephen Olivier and Gerald Sabin and
               Jan Prins and P. Sadayappan and Chau-Wen Tseng},
  title     = {Dynamic Load Balancing of Unbalanced Computations Using
               Message Passing},
  booktitle = {IPDPS},
  year      = {2007},
  pages     = {1--8}
}


% CCGRID 2010 paper on selective failure recovery in a task-parallel model.
% The page range uses the BibTeX double hyphen.
@inproceedings{dinan:ccgrid10,
  author    = {James Dinan and Arjun Singri and P. Sadayappan and
               Sriram Krishnamoorthy},
  title     = {Selective Recovery from Failures in a Task Parallel
               Programming Model},
  booktitle = {CCGRID},
  year      = {2010},
  pages     = {709--714}
}


% ICPP 2008 paper introducing the Scioto task-parallelism framework.
% The page range uses the BibTeX double hyphen.
@inproceedings{dinan:icpp08,
  author    = {James Dinan and Sriram Krishnamoorthy and D. Brian Larkins and
               Jarek Nieplocha and P. Sadayappan},
  title     = {Scioto: A Framework for Global-View Task Parallelism},
  booktitle = {ICPP},
  year      = {2008},
  pages     = {586--593}
}

% HOTI 2010 paper describing the Gemini system interconnect.
% Empty volume/number/ISSN fields are removed (BibTeX warns on empty fields),
% the month uses the standard macro, the page range uses a double hyphen, and
% the booktitle is written in natural word order.
@inproceedings{alverson:hoti10,
  author    = {Alverson, R. and Roweth, D. and Kaplan, L.},
  title     = {The {Gemini} System Interconnect},
  booktitle = {Proceedings of the 2010 IEEE 18th Annual Symposium on High Performance Interconnects (HOTI)},
  year      = {2010},
  month     = aug,
  pages     = {83--87},
  keywords  = {Crays supercomputer system;Gemini system interconnect;OS bypass;atomic memory operations;direct user completion notification;operating system;mainframes;multiprocessor interconnection networks;network computers;parallel machines;},
  doi       = {10.1109/HOTI.2010.23}
}


% SIGPLAN Fortran Forum article on Co-array Fortran (1998).
% The issue number is stored in the standard "number" field (classic styles
% ignore "issue"), the month uses the standard macro, and the language name
% is brace-protected against sentence-casing.
@article{caf,
  author    = {Numrich, Robert W. and Reid, John},
  title     = {{Co-array Fortran} for parallel programming},
  journal   = {SIGPLAN Fortran Forum},
  volume    = {17},
  number    = {2},
  month     = aug,
  year      = {1998},
  issn      = {1061-7264},
  pages     = {1--31},
  numpages  = {31},
  acmid     = {289920},
  publisher = {ACM}
}


% Web reference for the NERSC Hopper Phase II system.
@misc{hopper,
  howpublished = {http://www.nersc.gov/users/computational-systems/hopper},
  title        = {{NERSC Hopper Phase II System}}
}

% Web reference for a talk on the Blue Gene/Q network, listed under the
% hoti19 keynotes URL.
@misc{heidelberger:hoti11,
  howpublished = {http://www.hoti.org/hoti19/keynotes/},
  title        = {{The IBM Blue Gene/Q Interconnection Network and Message Unit}}
}

  % Cray Users Group 2010 paper describing the DMAPP one-sided API.
  % The empty volume field is removed, the month uses the standard macro, and
  % the first author's surname carries the "ten" particle as in the
  % vishnu:hoti11 entry of this file.
  % NOTE(review): the venue is a user-group meeting stored in "journal" -
  % confirm whether this should be an inproceedings entry.
  @article{dmapp,
    author  = {ten Bruggencate, M. and Roweth, D.},
    title   = {{DMAPP: An API for One-Sided Programming Model on Baker Systems}},
    journal = {Cray Users Group (CUG)},
    year    = {2010},
    month   = aug
}


% HOTI 2011 paper evaluating the Cray Gemini interconnect for PGAS runtimes.
% Proper nouns and the PGAS acronym are brace-protected so sentence-casing
% styles keep their capitalisation.
@inproceedings{vishnu:hoti11,
  author    = {Vishnu, Abhinav and ten Bruggencate, Monika and Olson, Ryan},
  title     = {Evaluating the Potential of {Cray Gemini} Interconnect for {PGAS} Communication Runtime Systems},
  booktitle = {Proceedings of the 2011 IEEE 19th Annual Symposium on High Performance Interconnects},
  year      = {2011},
  isbn      = {978-0-7695-4537-0},
  pages     = {70--77},
  numpages  = {8}
}

% IEEE Transactions on Computers article on location consistency (2000).
% The page range uses a double hyphen, and the dash in the title is written
% as an em dash instead of a bare hyphen.
@article{gao:computer00,
  author  = {Guang R. Gao and Vivek Sarkar},
  title   = {Location Consistency---A New Memory Model and Cache Consistency Protocol},
  journal = {IEEE Transactions on Computers},
  volume  = {49},
  pages   = {798--813},
  year    = {2000},
  issn    = {0018-9340}
}


% Web reference (Wikipedia) for the Blue Gene/Q architecture.
@misc{bgq-wikipedia,
  howpublished = {http://en.wikipedia.org/wiki/BlueGene},
  title        = {{Blue Gene/Q Architecture}}
}

% IEEE Micro article on the Blue Gene/Q compute chip (volume 32, number 2).
% The month uses standard macros, the page range uses a double hyphen, the
% journal name is in natural order, and initials are space-separated.
% NOTE(review): the surname "Chist" may be a typo carried over from the
% exported record - confirm against the paper.
@article{haring:micro12,
  author  = {Haring, R. A. and Ohmacht, M. and Fox, T. W. and
             Gschwind, M. K. and Satterfield, D. L. and Sugavanam, K. and
             Coteus, P. W. and Heidelberger, P. and Blumrich, M. A. and
             Wisniewski, R. W. and Gara, A. and Chiu, G. L.-T. and
             Boyle, P. A. and Chist, N. H. and Kim, Changhoan},
  title   = {The {IBM} {Blue Gene/Q} Compute Chip},
  journal = {IEEE Micro},
  year    = {2012},
  month   = mar # "--" # apr,
  volume  = {32},
  number  = {2},
  pages   = {48--60},
  doi     = {10.1109/MM.2011.108},
  issn    = {0272-1732}
}

% IEEE Micro article on the Blue Gene/Q interconnection fabric (volume 32,
% number 1).
% The month uses standard macros, the page range uses a double hyphen, the
% journal name is in natural order, and initials are space-separated.
@article{chen:micro12,
  author  = {Chen, Dong and Eisley, N. A. and Heidelberger, P. and
             Senger, R. M. and Sugawara, Y. and Kumar, S. and
             Salapura, V. and Satterfield, D. and Steinmacher-Burow, B. and
             Parker, J.},
  title   = {The {IBM} {Blue Gene/Q} Interconnection Fabric},
  journal = {IEEE Micro},
  year    = {2012},
  month   = jan # "--" # feb,
  volume  = {32},
  number  = {1},
  pages   = {32--43},
  doi     = {10.1109/MM.2011.96},
  issn    = {0272-1732}
}

% Technical report on the LogGP model (1995).
% The issuing organisation is stored in "institution", which techreport
% entries require; the model names are brace-protected against sentence-casing.
@techreport{alexandrov:95,
  author      = {Alexandrov, Albert and Ionescu, Mihai F. and
                 Schauser, Klaus E. and Scheiman, Chris},
  title       = {{LogGP}: Incorporating Long Messages into the {LogP} Model --- One step closer towards a realistic model for parallel computation},
  institution = {University of California at Santa Barbara},
  address     = {Santa Barbara, CA, USA},
  year        = {1995}
}

% Technical report on a PGAS communication subsystem for Cray Gemini (2012).
% The issuing organisation is stored in "institution", which techreport
% entries require; proper nouns and the acronym are brace-protected.
@techreport{vishnu:icpp12tr,
  author      = {Abhinav Vishnu and Jeffrey Daily and Bruce Palmer},
  title       = {Scalable {PGAS} Communication Subsystem on {Cray Gemini} Interconnect},
  institution = {Pacific Northwest National Laboratory},
  address     = {Richland, WA, USA},
  year        = {2012}
}


% Conference paper on Global Futures (2012).
% The entry carries a proceedings booktitle and no institution, so it is
% typed as inproceedings instead of techreport; "Global Arrays" is
% brace-protected against sentence-casing.
@inproceedings{chavarria:ccgrid12,
  author    = {Daniel Chavarria and Sriram Krishnamoorthy and Abhinav Vishnu},
  title     = {Global Futures: A Multithreaded Execution Model for {Global Arrays} Based Applications},
  booktitle = {Proceedings of the 2012 International Conference on Cluster, Cloud and Grid Computing},
  year      = {2012}
}

% SC '11 paper on reduction to condensed forms for symmetric eigenvalue problems.
@inproceedings{plasma,
  author    = {Haidar, Azzam and Ltaief, Hatem and Dongarra, Jack},
  title     = {Parallel reduction to condensed forms for symmetric eigenvalue problems using aggregated fine-grained and memory-aware kernels},
  booktitle = {Proceedings of 2011 International Conference for High Performance Computing, Networking, Storage and Analysis},
  series    = {SC '11},
  articleno = {8},
  numpages  = {11},
  doi       = {10.1145/2063384.2063394},
  year      = {2011}
}

% Web reference for the DAGuE project.
% The author list uses "and others" so the bibliography style renders
% "et al." itself instead of treating it as part of one braced name.
@misc{dague,
  author       = {Dongarra, Jack and others},
  title        = {{Directed Acyclic Graph Unified Environment}},
  howpublished = {http://icl.cs.utk.edu/dague/}
}

% EuroMPI'11 paper on a uGNI-based MPICH2 network module.
% The title is case-frozen by its outer braces, so "Cray" is capitalised
% explicitly; fields are re-indented to a uniform layout.
@inproceedings{pritchard:eurompi11,
  author    = {Pritchard, Howard and Gorodetsky, Igor and Buntinas, Darius},
  title     = {{A uGNI-based MPICH2 nemesis network module for the Cray XE}},
  booktitle = {Proceedings of the 18th European MPI Users' Group conference on Recent advances in the message passing interface},
  series    = {EuroMPI'11},
  year      = {2011},
  isbn      = {978-3-642-24448-3},
  location  = {Santorini, Greece},
  pages     = {110--119},
  numpages  = {10}
}
% IPDPS 2012 paper on a uGNI-based message-driven runtime for Cray systems.
% The forced line break is removed from the title (line breaking belongs to
% the bibliography style), and the month uses the standard macro.
@inproceedings{sun:ipdps12,
  author    = {Yanhua Sun and Gengbin Zheng and L. V. Kale and
               Terry R. Jones and Ryan Olson},
  title     = {{A uGNI-based Asynchronous Message-driven Runtime System for Cray Supercomputers with Gemini Interconnect}},
  booktitle = {Proceedings of 26th IEEE International Parallel and Distributed Processing Symposium (IPDPS)},
  year      = {2012},
  month     = may,
  address   = {Shanghai, China}
}

